12#ifndef AOM_AV1_ENCODER_TPL_MODEL_H_
13#define AOM_AV1_ENCODER_TPL_MODEL_H_
23struct AV1_SEQ_CODING_TOOLS;
30#include "config/aom_config.h"
32#include "aom/aom_tpl.h"
33#include "aom_scale/yv12config.h"
34#include "aom_util/aom_pthread.h"
36#include "av1/common/mv.h"
37#include "av1/common/scale.h"
38#include "av1/encoder/av1_ext_ratectrl.h"
41#include "av1/encoder/ratectrl.h"
// Maps a block edge length to the matching square BLOCK_SIZE constant.
// The visible cases handle 64, 32, 16, 8 and 4; any other length reaches the
// assert at the end.
// NOTE(review): the switch header, the default label, whatever follows the
// assert, and the closing braces are absent from this listing -- confirm
// against the real header before relying on the fallback behaviour.
43static inline BLOCK_SIZE convert_length_to_bsize(
int length) {
45 case 64:
return BLOCK_64X64;
46 case 32:
return BLOCK_32X32;
47 case 16:
return BLOCK_16X16;
48 case 8:
return BLOCK_8X8;
49 case 4:
return BLOCK_4X4;
// Unsupported length: trips in debug builds with a descriptive message.
51 assert(0 &&
"Invalid block size for tpl model");
// Per-frame synchronization state for TPL row multi-threading.
// NOTE(review): the embedded listing numbers jump (60 -> 65 -> 73), so some
// members and any preprocessor guards are likely missing from this view.
56typedef struct AV1TplRowMultiThreadSync {
// Pointers to the mutex / condition variable objects used by this sync
// state (allocation and ownership are not shown here).
59 pthread_mutex_t *mutex_;
60 pthread_cond_t *cond_;
// Pointer to an int array; by its name, presumably the number of finished
// columns per row -- TODO confirm against the implementation.
65 int *num_finished_cols;
// Counter of worker threads currently active (semantics inferred from the
// name; verify against the callers).
73 int num_threads_working;
74} AV1TplRowMultiThreadSync;
// Shared information for TPL row multi-threading: one mutex pointer plus two
// function pointers that operate on an AV1TplRowMultiThreadSync.
76typedef struct AV1TplRowMultiThreadInfo {
82 pthread_mutex_t *mutex_;
// Hook taking the sync state and a (r, c) position; presumably waits until
// the dependency for that position is satisfied -- TODO confirm.
85 void (*sync_read_ptr)(AV1TplRowMultiThreadSync *tpl_mt_sync,
int r,
int c);
// Hook taking the sync state and a (r, c) position.
// NOTE(review): the parameter list is cut off after `int c,` in this
// listing; the trailing parameter(s) and `);` are missing.
86 void (*sync_write_ptr)(AV1TplRowMultiThreadSync *tpl_mt_sync,
int r,
int c,
88} AV1TplRowMultiThreadInfo;
// Upper bound on TPL frame indices: twice the look-ahead buffer count.
101#define MAX_TPL_FRAME_IDX (2 * MAX_LAG_BUFFERS)
// Capacity used for per-frame TPL arrays (see tpl_stats_buffer and the
// RD_COMMAND lists): MAX_TPL_FRAME_IDX plus REF_FRAMES plus one.
104#define MAX_LENGTH_TPL_FRAME_STATS (MAX_TPL_FRAME_IDX + REF_FRAMES + 1)
// log2 of a scale factor; by its name it applies to TPL dependency costs
// (usage is not visible in this listing).
105#define TPL_DEP_COST_SCALE_LOG2 4
// Small positive constant (1e-7); presumably guards floating-point
// comparisons/divisions -- verify at the use sites.
107#define TPL_EPSILON 0.0000001
// Transform-coefficient statistics gathered by the TPL model.
// NOTE(review): the closing `} TplTxfmStats;` and further members are missing
// from this listing; other code in this file reads `ready` and `coeff_num`
// from this struct.
109typedef struct TplTxfmStats {
// Two parallel 256-entry arrays; by name, per-coefficient-position running
// sum and mean of absolute coefficient values -- TODO confirm.
111 double abs_coeff_sum[256];
112 double abs_coeff_mean[256];
// Count of transform blocks (passed as the block count to
// av1_laplace_estimate_frame_rate() elsewhere in this file).
113 int txfm_block_count;
// Per-block statistics record of the TPL dependency model.
// NOTE(review): only a subset of members survives in this listing (embedded
// numbering jumps 125 -> 132 -> 135 -> 141) and the closing line is missing.
125typedef struct TplDepStats {
// Two-entry distortion array; the 2-entry shape matches ref_frame_index[2]
// below, presumably one entry per reference of a compound prediction.
132 int64_t cmp_recrf_dist[2];
// One prediction-error value per inter reference frame.
135 int64_t pred_error[INTER_REFS_PER_FRAME];
// Two-entry rate array paired with cmp_recrf_dist.
141 int32_t cmp_recrf_rate[2];
// One motion vector per inter reference frame.
142 int_mv mv[INTER_REFS_PER_FRAME];
// Two reference-frame indices (index semantics not visible here).
143 int8_t ref_frame_index[2];
// Per-frame container for the TPL dependency model.
// NOTE(review): members between listing lines 151 and 159 and the closing
// `} TplDepFrame;` are absent from this view.
146typedef struct TplDepFrame {
// Pointer to this frame's TplDepStats records (layout/stride not shown).
148 TplDepStats *tpl_stats_ptr;
// Read-only picture buffer (const) and a writable reconstruction buffer.
149 const YV12_BUFFER_CONFIG *gf_picture;
150 YV12_BUFFER_CONFIG *rec_picture;
// One int per reference-frame slot (REF_FRAMES entries).
151 int ref_map_index[REF_FRAMES];
// Display-order index of the frame, by name -- TODO confirm.
159 uint32_t frame_display_index;
220 struct scale_factors
sf;
239 const YV12_BUFFER_CONFIG *
ref_frame[INTER_REFS_PER_FRAME];
268#if CONFIG_BITRATE_ACCURACY || CONFIG_RATECTRL_LOG
269#define VBR_RC_INFO_MAX_FRAMES 500
272#if CONFIG_BITRATE_ACCURACY
280 double total_bit_budget;
281 int show_frame_count;
283 int gop_showframe_count;
284 double gop_bit_budget;
285 double scale_factors[FRAME_UPDATE_TYPES];
287 double mv_scale_factors[FRAME_UPDATE_TYPES];
292 int q_index_list_ready;
293 int q_index_list[VBR_RC_INFO_MAX_FRAMES];
297 double qstep_ratio_list[VBR_RC_INFO_MAX_FRAMES];
300 TplTxfmStats txfm_stats_list[VBR_RC_INFO_MAX_FRAMES];
301 FRAME_UPDATE_TYPE update_type_list[VBR_RC_INFO_MAX_FRAMES];
302 int gop_start_idx_list[VBR_RC_INFO_MAX_FRAMES];
303 int gop_length_list[VBR_RC_INFO_MAX_FRAMES];
305 int total_frame_count;
// Resets the per-GOP q-index state in vbr_rc_info: clears the
// q_index_list_ready flag and applies av1_zero to the q_index_list array.
// NOTE(review): the closing brace is missing from this listing.
310static inline void vbr_rc_reset_gop_data(VBR_RATECTRL_INFO *vbr_rc_info) {
311 vbr_rc_info->q_index_list_ready = 0;
312 av1_zero(vbr_rc_info->q_index_list);
315void av1_vbr_rc_init(VBR_RATECTRL_INFO *vbr_rc_info,
double total_bit_budget,
316 int show_frame_count);
318int av1_vbr_rc_frame_coding_idx(
const VBR_RATECTRL_INFO *vbr_rc_info,
321void av1_vbr_rc_append_tpl_info(VBR_RATECTRL_INFO *vbr_rc_info,
322 const struct TPL_INFO *tpl_info);
324void av1_vbr_rc_set_gop_bit_budget(VBR_RATECTRL_INFO *vbr_rc_info,
325 int gop_showframe_count);
327void av1_vbr_rc_compute_q_indices(
int base_q_index,
int frame_count,
328 const double *qstep_ratio_list,
339void av1_vbr_rc_update_q_index_list(VBR_RATECTRL_INFO *vbr_rc_info,
365double av1_vbr_rc_info_estimate_gop_bitrate(
367 const double *update_type_scale_factors,
int frame_count,
368 const FRAME_UPDATE_TYPE *update_type_list,
const double *qstep_ratio_list,
369 const TplTxfmStats *stats_list,
int *q_index_list,
370 double *estimated_bitrate_byframe);
393int av1_vbr_rc_info_estimate_base_q(
395 const double *update_type_scale_factors,
int frame_count,
396 const FRAME_UPDATE_TYPE *update_type_list,
const double *qstep_ratio_list,
397 const TplTxfmStats *stats_list,
int *q_index_list,
398 double *estimated_bitrate_byframe);
406 RD_OPTION_SET_Q_RDMULT
409typedef struct RD_COMMAND {
410 RD_OPTION option_ls[MAX_LENGTH_TPL_FRAME_STATS];
411 int q_index_ls[MAX_LENGTH_TPL_FRAME_STATS];
412 int rdmult_ls[MAX_LENGTH_TPL_FRAME_STATS];
417void av1_read_rd_command(
const char *filepath, RD_COMMAND *rd_command);
// Returns true when the external rate controller is marked ready and provides
// a send_tpl_gop_stats callback (i.e. the pointer is non-NULL).
// ext_rc is dereferenced unconditionally, so it must not be NULL.
// NOTE(review): the closing brace is missing from this listing.
420static inline bool av1_use_tpl_for_extrc(AOM_EXT_RATECTRL
const *ext_rc) {
421 return ext_rc->ready && ext_rc->funcs.send_tpl_gop_stats != NULL;
432void av1_setup_tpl_buffers(
struct AV1_PRIMARY *
const ppi,
434 int height,
int byte_alignment,
int lag_in_frames);
// Releases the five scratch buffers held by tpl_tmp_buffers (predictor8,
// src_diff, coeff, qcoeff, dqcoeff) via aom_free and resets each pointer to
// NULL right after freeing it, so no freed pointer is left behind in the
// struct.
// NOTE(review): the closing brace is missing from this listing.
436static inline void tpl_dealloc_temp_buffers(TplBuffers *tpl_tmp_buffers) {
437 aom_free(tpl_tmp_buffers->predictor8);
438 tpl_tmp_buffers->predictor8 = NULL;
439 aom_free(tpl_tmp_buffers->src_diff);
440 tpl_tmp_buffers->src_diff = NULL;
441 aom_free(tpl_tmp_buffers->coeff);
442 tpl_tmp_buffers->coeff = NULL;
443 aom_free(tpl_tmp_buffers->qcoeff);
444 tpl_tmp_buffers->qcoeff = NULL;
445 aom_free(tpl_tmp_buffers->dqcoeff);
446 tpl_tmp_buffers->dqcoeff = NULL;
// Allocates the five TPL scratch buffers in tpl_tmp_buffers for a square
// block of edge length tpl_bsize_1d.
// Each buffer holds tpl_bsize_1d * tpl_bsize_1d elements of its own element
// type, except predictor8 which is sized for twice that many elements.
// All allocations go through aom_memalign with 32 as the first argument
// (presumably the byte alignment -- confirm against aom_mem.h).
// If any allocation yields NULL, every buffer is released again through
// tpl_dealloc_temp_buffers().
// NOTE(review): the return statements and closing braces are missing from
// this listing, so the exact bool result on each path is not visible.
449static inline bool tpl_alloc_temp_buffers(TplBuffers *tpl_tmp_buffers,
450 uint8_t tpl_bsize_1d) {
// Number of pixels in one square TPL block.
452 const int tpl_block_pels = tpl_bsize_1d * tpl_bsize_1d;
// Note the extra factor of 2 for predictor8 only.
455 tpl_tmp_buffers->predictor8 = (uint8_t *)aom_memalign(
456 32, tpl_block_pels * 2 *
sizeof(*tpl_tmp_buffers->predictor8));
457 tpl_tmp_buffers->src_diff = (int16_t *)aom_memalign(
458 32, tpl_block_pels *
sizeof(*tpl_tmp_buffers->src_diff));
459 tpl_tmp_buffers->coeff = (tran_low_t *)aom_memalign(
460 32, tpl_block_pels *
sizeof(*tpl_tmp_buffers->coeff));
461 tpl_tmp_buffers->qcoeff = (tran_low_t *)aom_memalign(
462 32, tpl_block_pels *
sizeof(*tpl_tmp_buffers->qcoeff));
463 tpl_tmp_buffers->dqcoeff = (tran_low_t *)aom_memalign(
464 32, tpl_block_pels *
sizeof(*tpl_tmp_buffers->dqcoeff));
// All-or-nothing: a single failed allocation rolls back the others.
466 if (!(tpl_tmp_buffers->predictor8 && tpl_tmp_buffers->src_diff &&
467 tpl_tmp_buffers->coeff && tpl_tmp_buffers->qcoeff &&
468 tpl_tmp_buffers->dqcoeff)) {
469 tpl_dealloc_temp_buffers(tpl_tmp_buffers);
491void av1_tpl_preload_rc_estimate(
494int av1_tpl_ptr_pos(
int mi_row,
int mi_col,
int stride, uint8_t right_shift);
496void av1_init_tpl_stats(
TplParams *
const tpl_data);
498int av1_tpl_stats_ready(
const TplParams *tpl_data,
int gf_frame_index);
500void av1_tpl_rdmult_setup(
struct AV1_COMP *cpi);
503 BLOCK_SIZE sb_size,
int mi_row,
int mi_col);
505void av1_mc_flow_dispenser_row(
struct AV1_COMP *cpi,
506 TplTxfmStats *tpl_txfm_stats,
508 int mi_row, BLOCK_SIZE bsize, TX_SIZE tx_size);
522double av1_exponential_entropy(
double q_step,
double b);
537double av1_laplace_entropy(
double q_step,
double b,
double zero_bin_ratio);
539#if CONFIG_BITRATE_ACCURACY
557double av1_laplace_estimate_frame_rate(
int q_index,
int block_count,
558 const double *abs_coeff_mean,
568void av1_init_tpl_txfm_stats(TplTxfmStats *tpl_txfm_stats);
570#if CONFIG_BITRATE_ACCURACY
579void av1_accumulate_tpl_txfm_stats(
const TplTxfmStats *sub_stats,
580 TplTxfmStats *accumulated_stats);
590void av1_record_tpl_txfm_block(TplTxfmStats *tpl_txfm_stats,
591 const tran_low_t *coeff);
601void av1_tpl_txfm_stats_update_abs_coeff_mean(TplTxfmStats *txfm_stats);
619double av1_estimate_coeff_entropy(
double q_step,
double b,
620 double zero_bin_ratio,
int qcoeff);
623int64_t av1_delta_rate_cost(int64_t delta_rate, int64_t recrf_dist,
624 int64_t srcrf_dist,
int pix_num);
641int av1_get_overlap_area(
int row_a,
int col_a,
int row_b,
int col_b,
int width,
653int av1_tpl_get_q_index(
const TplParams *tpl_data,
int gf_frame_index,
666double av1_tpl_get_qstep_ratio(
const TplParams *tpl_data,
int gf_frame_index);
676int av1_get_q_index_from_qstep_ratio(
int leaf_qindex,
double qstep_ratio,
693int_mv av1_compute_mv_difference(
const TplDepFrame *tpl_frame,
int row,
int col,
694 int step,
int tpl_stride,
int right_shift);
703double av1_tpl_compute_frame_mv_entropy(
const TplDepFrame *tpl_frame,
704 uint8_t right_shift);
710void av1_free_tpl_gop_stats(AomTplGopStats *extrc_tpl_gop_stats);
712#if CONFIG_RATECTRL_LOG
714 int coding_frame_count;
718 int q_index_list[VBR_RC_INFO_MAX_FRAMES];
719 double qstep_ratio_list[VBR_RC_INFO_MAX_FRAMES];
720 FRAME_UPDATE_TYPE update_type_list[VBR_RC_INFO_MAX_FRAMES];
723 TplTxfmStats txfm_stats_list[VBR_RC_INFO_MAX_FRAMES];
726 double est_coeff_rate_list[VBR_RC_INFO_MAX_FRAMES];
729 double act_rate_list[VBR_RC_INFO_MAX_FRAMES];
730 double act_coeff_rate_list[VBR_RC_INFO_MAX_FRAMES];
// Initializes a rate-control log by applying av1_zero to the whole
// RATECTRL_LOG object that rc_log points to.
733static inline void rc_log_init(RATECTRL_LOG *rc_log) { av1_zero(*rc_log); }
// Stores a by-value copy of *txfm_stats into slot coding_index of
// rc_log->txfm_stats_list.
// coding_index is not range-checked here; the list holds
// VBR_RC_INFO_MAX_FRAMES entries, so the caller must stay below that.
// NOTE(review): the closing brace is missing from this listing.
735static inline void rc_log_frame_stats(RATECTRL_LOG *rc_log,
int coding_index,
736 const TplTxfmStats *txfm_stats) {
737 rc_log->txfm_stats_list[coding_index] = *txfm_stats;
740#if CONFIG_RATECTRL_LOG && CONFIG_THREE_PASS && CONFIG_BITRATE_ACCURACY
// Records the encode parameters of one coded frame in the log: qstep ratio,
// q index and update type are written to slot coding_index of their lists.
// The estimated coefficient rate for the slot is reset to 0 and, when the
// transform stats previously logged for that slot are flagged ready, replaced
// by the result of av1_laplace_estimate_frame_rate().
// NOTE(review): the `coding_index` parameter line and the closing braces are
// missing from this listing.
741static inline void rc_log_frame_encode_param(RATECTRL_LOG *rc_log,
743 double qstep_ratio,
int q_index,
744 FRAME_UPDATE_TYPE update_type) {
745 rc_log->qstep_ratio_list[coding_index] = qstep_ratio;
746 rc_log->q_index_list[coding_index] = q_index;
747 rc_log->update_type_list[coding_index] = update_type;
// Stats for this slot are read back from the log itself.
748 const TplTxfmStats *txfm_stats = &rc_log->txfm_stats_list[coding_index];
// Default to 0 so the slot is well-defined when stats are not ready.
749 rc_log->est_coeff_rate_list[coding_index] = 0;
750 if (txfm_stats->ready) {
751 rc_log->est_coeff_rate_list[coding_index] = av1_laplace_estimate_frame_rate(
752 q_index, txfm_stats->txfm_block_count, txfm_stats->abs_coeff_mean,
753 txfm_stats->coeff_num);
// Writes the actual total rate and the actual coefficient rate of one coded
// frame into slot coding_index of act_rate_list / act_coeff_rate_list.
// NOTE(review): the `act_rate` parameter line and the closing brace are
// missing from this listing.
758static inline void rc_log_frame_entropy(RATECTRL_LOG *rc_log,
int coding_index,
760 double act_coeff_rate) {
761 rc_log->act_rate_list[coding_index] = act_rate;
762 rc_log->act_coeff_rate_list[coding_index] = act_coeff_rate;
// Stores chunk-level information in the log: the base q index and the number
// of coding frames.
// NOTE(review): the `base_q_index` parameter line and the closing brace are
// missing from this listing.
765static inline void rc_log_record_chunk_info(RATECTRL_LOG *rc_log,
767 int coding_frame_count) {
768 rc_log->base_q_index = base_q_index;
769 rc_log->coding_frame_count = coding_frame_count;
// Dumps the rate-control log to stdout with printf: a fixed "= chunk 1"
// header, the coding frame count with the base q index, a "= frame" line
// carrying the coding frame count, then one line per coding index with the
// update type, q index, qstep ratio, estimated coefficient rate, actual
// coefficient rate and actual rate.
// NOTE(review): the loop increment, the per-frame `printf(` opener and the
// closing braces are missing from this listing.
772static inline void rc_log_show(
const RATECTRL_LOG *rc_log) {
773 printf(
"= chunk 1\n");
774 printf(
"coding_frame_count %d base_q_index %d\n", rc_log->coding_frame_count,
775 rc_log->base_q_index);
776 printf(
"= frame %d\n", rc_log->coding_frame_count);
// Iterates over every logged coding frame, from 0 up to coding_frame_count.
777 for (
int coding_idx = 0; coding_idx < rc_log->coding_frame_count;
780 "coding_idx %d update_type %d q %d qstep_ratio %f est_coeff_rate %f "
781 "act_coeff_rate %f act_rate %f\n",
782 coding_idx, rc_log->update_type_list[coding_idx],
783 rc_log->q_index_list[coding_idx], rc_log->qstep_ratio_list[coding_idx],
784 rc_log->est_coeff_rate_list[coding_idx],
785 rc_log->act_coeff_rate_list[coding_idx],
786 rc_log->act_rate_list[coding_idx]);
struct macroblock MACROBLOCK
Encoder's parameters related to the current coding block.
enum aom_bit_depth aom_bit_depth_t
Bit depth for codec. This enumeration determines the bit depth of the codec.
int av1_tpl_setup_stats(struct AV1_COMP *cpi, int gop_eval, const struct EncodeFrameParams *const frame_params)
Implements temporal dependency modelling for a GOP (GF/ARF group) and selects between 16 and 32 frame GOP structure.
Describes look ahead buffer operations.
Top level encoder structure.
Definition encoder.h:2897
Top level primary encoder structure.
Definition encoder.h:2590
Params related to MB_MODE_INFO arrays and related info.
Definition av1_common_int.h:511
Contains per-frame encoding parameters decided upon by av1_encode_strategy() and passed down to av1_encode().
Definition encoder.h:3747
Data related to the current GF/ARF group and the individual frames within the group.
Definition firstpass.h:343
Params related to temporal dependency model.
Definition tpl_model.h:168
const YV12_BUFFER_CONFIG * src_ref_frame[INTER_REFS_PER_FRAME]
Definition tpl_model.h:232
struct scale_factors sf
Definition tpl_model.h:220
int ready
Definition tpl_model.h:172
TplDepFrame tpl_stats_buffer[MAX_LENGTH_TPL_FRAME_STATS]
Definition tpl_model.h:189
YV12_BUFFER_CONFIG prev_gop_arf_src
Definition tpl_model.h:244
uint8_t tpl_bsize_1d
Definition tpl_model.h:182
AV1TplRowMultiThreadSync tpl_mt_sync
Definition tpl_model.h:255
TplDepFrame * tpl_frame
Definition tpl_model.h:215
int border_in_pixels
Definition tpl_model.h:260
TplDepStats * tpl_stats_pool[MAX_LAG_BUFFERS]
Definition tpl_model.h:196
TplTxfmStats * txfm_stats_list
Definition tpl_model.h:204
int64_t prev_gop_arf_disp_order
Definition tpl_model.h:249
YV12_BUFFER_CONFIG tpl_rec_pool[MAX_LAG_BUFFERS]
Definition tpl_model.h:210
uint8_t tpl_stats_block_mis_log2
Definition tpl_model.h:177
int frame_idx
Definition tpl_model.h:225
double r0_adjust_factor
Definition tpl_model.h:265
const YV12_BUFFER_CONFIG * ref_frame[INTER_REFS_PER_FRAME]
Definition tpl_model.h:239